Java 读取 RSS，顺便还有xpath的用法-白红宇

Java 读取 RSS，顺便还有xpath的用法

阅读量：4120 次

发布时间：2019-05-25

本文共 4933 字，大约阅读时间需要 16 分钟。

Java读取RSS：

//http://zfive.blogbus.com/logs/20959998.html
package com.yourcompany.struts.user;
import java.io.File;
import java.io.IOException;
import java.io.InputStream;
import java.net.URL;
import java.util.ArrayList;
import java.util.List;
import javax.xml.parsers.DocumentBuilder;
import javax.xml.parsers.DocumentBuilderFactory;
import javax.xml.parsers.ParserConfigurationException;
import org.w3c.dom.Document;
import org.w3c.dom.Element;
import org.w3c.dom.Node;
import org.w3c.dom.NodeList;
import org.xml.sax.SAXException;
/**
 * Minimal RSS reader: downloads a feed, parses it with the JAXP DOM parser and
 * prints the title, author, link and description of every {@code <item>}.
 */
public class Test {

    /** Feed location used when no URL is supplied on the command line. */
    private static final String DEFAULT_FEED_URL = "http://localhost:8080/rSS/pfocus.xml";

    /**
     * Reads the feed and prints each item to standard output, followed by a
     * separator line. Parser and I/O failures are reported on standard error.
     *
     * @param args optional; {@code args[0]} is the URL of the feed to read
     *             (any scheme {@link URL} understands, e.g. {@code http:} or
     *             {@code file:}). Defaults to {@link #DEFAULT_FEED_URL}.
     */
    public static void main(String[] args) {
        String feedLocation = (args != null && args.length > 0) ? args[0] : DEFAULT_FEED_URL;
        try {
            DocumentBuilderFactory dbf = DocumentBuilderFactory.newInstance();
            DocumentBuilder db = dbf.newDocumentBuilder();

            // Close the stream explicitly: the DocumentBuilder contract does not
            // promise to close an InputStream handed to parse().
            Document doc;
            InputStream in = new URL(feedLocation).openStream();
            try {
                doc = db.parse(in);
            } finally {
                in.close();
            }

            // An RSS feed is a sequence of <item> elements; visit each one.
            NodeList items = doc.getElementsByTagName("item");
            for (int i = 0; i < items.getLength(); i++) {
                Element item = (Element) items.item(i);

                String title = childText(item, "title");
                String link = childText(item, "link");
                String description = childText(item, "description");
                String author = childText(item, "author");

                System.out.println(title);
                System.out.println(author);
                System.out.println(link);
                System.out.println(description);
                System.out.println("---------");
            }
        } catch (ParserConfigurationException e) {
            e.printStackTrace();
        } catch (SAXException e) {
            e.printStackTrace();
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Returns the text of the first descendant element named {@code tagName},
     * or an empty string when the element is missing or has no text. Optional
     * RSS elements such as {@code <author>} therefore no longer cause a
     * NullPointerException.
     */
    private static String childText(Element parent, String tagName) {
        Node node = parent.getElementsByTagName(tagName).item(0);
        if (node == null) {
            return "";
        }
        String text = node.getTextContent();
        return text == null ? "" : text;
    }
}

然后是xpath的部分：

import java.io.IOException;
import javax.xml.parsers.*;
import javax.xml.xpath.*;
import org.w3c.dom.*;
import org.xml.sax.SAXException;

/**
 * XPath example: parses an XML document and prints the price of every book
 * whose {@code <author>} is "Neal Stephenson".
 */
class XpathSample {

    /**
     * Evaluates the XPath query against the document and prints each matching
     * text node on its own line.
     *
     * @param args optional; {@code args[0]} is the path or URI of the XML
     *             document to query. Defaults to {@code XmlFile/books.xml}.
     * @throws ParserConfigurationException if no DOM parser can be created
     * @throws SAXException                 if the document is not well-formed
     * @throws IOException                  if the document cannot be read
     * @throws XPathExpressionException     if the expression cannot be compiled or evaluated
     */
    public static void main(String[] args)
            throws ParserConfigurationException, SAXException, IOException, XPathExpressionException {
        String xmlLocation = (args != null && args.length > 0) ? args[0] : "XmlFile/books.xml";

        DocumentBuilderFactory factory = DocumentBuilderFactory.newInstance();
        factory.setNamespaceAware(true);
        DocumentBuilder builder = factory.newDocumentBuilder();
        Document doc = builder.parse(xmlLocation);

        XPathFactory xFactory = XPathFactory.newInstance();
        XPath xpath = xFactory.newXPath();
        // Select the text node under <price> of each matching <book>.
        XPathExpression expr = xpath.compile("//book[author='Neal Stephenson']/price/text()");

        // NODESET makes evaluate() return a NodeList (typed as Object).
        Object result = expr.evaluate(doc, XPathConstants.NODESET);
        NodeList nodes = (NodeList) result;
        for (int i = 0; i < nodes.getLength(); i++) {
            System.out.println(nodes.item(i).getNodeValue());
        }
    }
}

大概就是这样了。对啦对啦，还有yahoo的weather格式：

首先了解Yahoo Weather Api的RSS Response格式：


   
   
    <rss version="2.0" xmlns:yweather="http://xml.weather.yahoo.com/ns/rss/1.0" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#">
    
         
     Yahoo! Weather - Tangshan, CH    
     http://us.rd.yahoo.com/dailynews/rss/weather/Tangshan__CH/*http://weather.yahoo.com/forecast/CHXX0131_f.html    
     
      Yahoo! Weather for Tangshan, CH
         
     
      en-us
         
     
      Fri, 22 Aug 2008 8:00 am CST
         
     
      60
         
         
         
         
         
         
           
     Yahoo! Weather      
     
      142
           
     
      18
           
     http://weather.yahoo.com      
     
      http://l.yimg.com/us.yimg.com/i/us/nws/th/main_142b.gif
             
     
            
      Conditions for Tangshan, CH at 8:00 am CST      
      
       39.63
            
      
       118.17
            
      http://us.rd.yahoo.com/dailynews/rss/weather/Tangshan__CH/*http://weather.yahoo.com/forecast/CHXX0131_f.html      
      
       Fri, 22 Aug 2008 8:00 am CST
            
            
      
      <description><![CDATA[
<img src="http://l.yimg.com/us.yimg.com/i/us/we/52/28.gif"/><br />
<b>Current Conditions:</b><br />
Mostly Cloudy, 67 F<br />
<br />
<b>Forecast:</b><br />
Fri - Partly Cloudy. High: 86 Low: 69<br />
Sat - Partly Cloudy. High: 88 Low: 70<br />
<br />
<a href="http://us.rd.yahoo.com/dailynews/rss/weather/Tangshan__CH/*http://weather.yahoo.com/forecast/CHXX0131_f.html">Full Forecast at Yahoo! Weather</a><br />
(provided by The Weather Channel)<br />
]]></description>
            
            
            
      
       CHXX0131_2008_08_22_8_00_CST